% arXiv preprint. The identifier is stored in the eprint fields rather than in
% journal/volume so that eprint-aware styles can format and link it themselves.
% NOTE(review): if a peer-reviewed version of this work exists, prefer citing
% that venue instead -- confirm before publication.
@misc{Chen2021EndtoendMV,
  author        = {Chen, Yi-Wen and Tsai, Yi-Hsuan and Yang, Ming-Hsuan},
  title         = {{End-to-end} {Multi-modal} Video Temporal Grounding},
  year          = {2021},
  eprint        = {2107.05624},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2107.05624},
}